#!/usr/bin/env bash
# Run the Qwen2 JSON preprocessing script over the validation split of a
# versioned dataset, once per configured sequence length.
#
# Usage: <script> <version>
#   <version>  Dataset version; substituted into the input path
#              data/data_v<version>.valid.jsonl.<seq_len>.hunyuan.json.ep1
#
# All paths are relative, so run this from the directory that contains
# both scripts/ and data/.
#
# Exit status: 2 when <version> is missing or empty; otherwise the status of
# the first failing preprocessing command, or 0 when every command succeeds.

# Refuse to run without a version: an empty value would silently build the
# path "data/data_v.valid.jsonl..." and pass it to the Python script.
if [ "$#" -lt 1 ] || [ -z "$1" ]; then
	printf 'usage: %s <version>\n' "${0##*/}" >&2
	exit 2
fi

version=$1
# NOTE(review): sample_merge is assigned but never read in this file. It is
# kept only in case something sourcing this script depends on it - confirm
# and remove if not.
sample_merge='false'

# Sequence lengths to preprocess. Add further values (e.g. 32768) to the list
# to process several lengths in one run.
for seq_len in 16384; do
	# The third argument is a boolean flag interpreted by the Python script;
	# the disabled train-split invocations below pass "true" instead.
	# NOTE(review): its exact meaning is not visible from this file.
	#
	# Alternative invocations, kept for reference:
	#	python scripts/preprocess_json_glm4.py data/data_v${version}.valid.jsonl.${seq_len}.hunyuan.json.ep1 ${seq_len} false
	#	python scripts/preprocess_json_glm4.py data/data_v${version}.train.jsonl.${seq_len}.hunyuan.json.ep1 ${seq_len} true
	#	python scripts/preprocess_json_qwen2.py data/data_v${version}.train.jsonl.${seq_len}.hunyuan.json.ep1 ${seq_len} true
	input_file="data/data_v${version}.valid.jsonl.${seq_len}.hunyuan.json.ep1"

	# Quote every expansion so a version containing spaces or glob characters
	# is passed through as a single, literal argument.
	python scripts/preprocess_json_qwen2.py "${input_file}" "${seq_len}" false || {
		status=$?
		printf 'error: preprocessing failed for %s (exit %s)\n' "${input_file}" "${status}" >&2
		# Stop at the first failure and propagate the Python exit status.
		exit "${status}"
	}
done
